{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "ename": "ModuleNotFoundError",
     "evalue": "No module named 'iwillwin'",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mModuleNotFoundError\u001b[0m                       Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-8-f4086f161579>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m()\u001b[0m\n\u001b[1;32m----> 1\u001b[1;33m \u001b[1;32mimport\u001b[0m \u001b[0miwillwin\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
      "\u001b[1;31mModuleNotFoundError\u001b[0m: No module named 'iwillwin'"
     ]
    }
   ],
   "source": [
    "import iwillwin"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Dataset file locations, each formed by appending a file name to `root`\n",
    "# (`root` carries the trailing slash, so plain concatenation is enough).\n",
    "root = \"dataset/\"\n",
    "eng_train, spn_train, test, unlabeled = (\n",
    "    root + filename\n",
    "    for filename in (\n",
    "        \"cikm_english_train_20180516.txt\",\n",
    "        \"cikm_spanish_train_20180516.txt\",\n",
    "        \"cikm_test_a_20180516.txt\",\n",
    "        \"cikm_unlabel_spanish_train_20180516.txt\",\n",
    "    )\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>eng_1</th>\n",
       "      <th>spn_1</th>\n",
       "      <th>eng_2</th>\n",
       "      <th>spn_2</th>\n",
       "      <th>label</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>hello, i click in product received</td>\n",
       "      <td>hola, hago clic en el producto recibido</td>\n",
       "      <td>I bought a product and have not received a con...</td>\n",
       "      <td>Compré un producto y no he recibido un correo ...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Hello! I have closed the dispute on may 21, 20...</td>\n",
       "      <td>¡Hola! Cerré la disputa el 21 de mayo de 2017 ...</td>\n",
       "      <td>I did not get refund of my money. Two months h...</td>\n",
       "      <td>No obtuve el reembolso de mi dinero. Han pasad...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>l ordered from spain to spain now they send th...</td>\n",
       "      <td>Ordené de España a España ahora que mandan el ...</td>\n",
       "      <td>My order came but color different from that I ...</td>\n",
       "      <td>Mi pedido llegó pero el color es diferente al ...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>Do I need to pay custom duty</td>\n",
       "      <td>¿Debo pagar impuestos personalizados?</td>\n",
       "      <td>How to pay customs duty</td>\n",
       "      <td>Cómo pagar los derechos de aduana</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>I didn't receive my order?</td>\n",
       "      <td>No recibí mi pedido?</td>\n",
       "      <td>My order shows that I have not paid, but I did</td>\n",
       "      <td>Mi pedido muestra que no he pagado, pero lo hice</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>Hi Eva. At first the question. Can I write in ...</td>\n",
       "      <td>Hola Eva Al principio la pregunta. ¿Puedo escr...</td>\n",
       "      <td>How can I write feedback for the goods?</td>\n",
       "      <td>¿Cómo puedo escribir comentarios para los prod...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>I am so angry</td>\n",
       "      <td>estoy tan enojado</td>\n",
       "      <td>I opened a dispute and so far nothing</td>\n",
       "      <td>Abrí una disputa y hasta ahora nada</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>I am not able to open dispute</td>\n",
       "      <td>No puedo abrir una disputa</td>\n",
       "      <td>I am not able to track.</td>\n",
       "      <td>No puedo rastrear.</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>how can I check order number?</td>\n",
       "      <td>¿Cómo puedo verificar el número de pedido?</td>\n",
       "      <td>Where I can see the number of my order tracker?</td>\n",
       "      <td>¿Dónde puedo ver el número de mi rastreador de...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>No, I need an answer from you.</td>\n",
       "      <td>No, necesito una respuesta tuya.</td>\n",
       "      <td>I need an invoice for this item i bought from you</td>\n",
       "      <td>Necesito una factura por este artículo que te ...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>how to reply to dispute</td>\n",
       "      <td>cómo responder a una disputa</td>\n",
       "      <td>How do I reply to feedback?</td>\n",
       "      <td>¿Cómo respondo a los comentarios?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>I DONT NOT LIVE IN CHINA, I LIVE BRAZIL</td>\n",
       "      <td>NO VIVO EN CHINA, VIVO BRASIL</td>\n",
       "      <td>i want live contact now</td>\n",
       "      <td>quiero contacto en vivo ahora</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>What does it mean: Your order will be closed in?</td>\n",
       "      <td>¿Qué significa: su orden será cerrada?</td>\n",
       "      <td>tracking order what does collection mean</td>\n",
       "      <td>orden de seguimiento qué significa colección</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>how to exchange coins</td>\n",
       "      <td>cómo intercambiar monedas</td>\n",
       "      <td>How to change my coins for coupon?</td>\n",
       "      <td>¿Cómo cambiar mis monedas por cupón?</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>how do I report a fraud seller</td>\n",
       "      <td>¿Cómo informo a un vendedor de fraude?</td>\n",
       "      <td>I want to report seller</td>\n",
       "      <td>Quiero informar al vendedor</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>Hi I want to buy something but seller have to ...</td>\n",
       "      <td>Hola, quiero comprar algo, pero el vendedor ti...</td>\n",
       "      <td>hi i need to tell u something about my order</td>\n",
       "      <td>hola necesito decirte algo sobre mi orden</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>How do I know whether my order has been shipped</td>\n",
       "      <td>¿Cómo puedo saber si mi pedido ha sido enviado?</td>\n",
       "      <td>How can I know if my order was shipped?</td>\n",
       "      <td>¿Cómo puedo saber si mi pedido fue enviado?</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>i cancelled my order with the seller already</td>\n",
       "      <td>cancelé mi pedido con el vendedor ya</td>\n",
       "      <td>I have already paid for my order</td>\n",
       "      <td>Ya pagué mi pedido</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>l ordered from spain to spain now they send th...</td>\n",
       "      <td>Ordené de España a España ahora que mandan el ...</td>\n",
       "      <td>I'm a supplier from china</td>\n",
       "      <td>Soy un proveedor de china</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>I want to do shopping how to buy</td>\n",
       "      <td>Quiero hacer compras cómo comprar</td>\n",
       "      <td>i will come to see you tomorrow</td>\n",
       "      <td>vendré a verte mañana</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>Hi, I live in Canada and I'm currently trackin...</td>\n",
       "      <td>Hola, vivo en Canadá y actualmente estoy rastr...</td>\n",
       "      <td>When can I receive my package after the produc...</td>\n",
       "      <td>¿Cuándo puedo recibir mi paquete después de en...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>The promotion began, but why the price of prod...</td>\n",
       "      <td>La promoción comenzó, pero ¿por qué el precio ...</td>\n",
       "      <td>Why the promotion price is not changed?</td>\n",
       "      <td>¿Por qué el precio de la promoción no se cambia?</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>the color number was L</td>\n",
       "      <td>el número de color era L</td>\n",
       "      <td>How can l see my message</td>\n",
       "      <td>¿Cómo puedo ver mi mensaje?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>i have done done all tracking</td>\n",
       "      <td>He hecho todo el seguimiento</td>\n",
       "      <td>I have a dispute and the company has done noth...</td>\n",
       "      <td>Tengo una disputa y la compañía no ha hecho na...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>My forms and documents are not going</td>\n",
       "      <td>Mis formularios y documentos no van</td>\n",
       "      <td>When am I going to receive my orders?</td>\n",
       "      <td>¿Cuándo recibiré mis pedidos?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>how to place order</td>\n",
       "      <td>cómo hacer un pedido</td>\n",
       "      <td>How do I place order?</td>\n",
       "      <td>¿Cómo hago el pedido?</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>impossible to join contact customer support</td>\n",
       "      <td>imposible unirse a la atención al cliente de c...</td>\n",
       "      <td>how can I contact customer support?</td>\n",
       "      <td>¿Cómo puedo contactar al servicio de atención ...</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>I want to do shopping how to buy</td>\n",
       "      <td>Quiero hacer compras cómo comprar</td>\n",
       "      <td>What is shopping cart?</td>\n",
       "      <td>¿Qué es un carrito de compras?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>I am not able to open dispute</td>\n",
       "      <td>No puedo abrir una disputa</td>\n",
       "      <td>I am not able to attach a photo for a dispute</td>\n",
       "      <td>No puedo adjuntar una foto para una disputa</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>my order isn't being processed</td>\n",
       "      <td>mi pedido no está siendo procesado</td>\n",
       "      <td>My debit card is not being accepted</td>\n",
       "      <td>Mi tarjeta de débito no está siendo aceptada</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19970</th>\n",
       "      <td>hi, i see this link but i have question.</td>\n",
       "      <td>hola, veo este enlace pero tengo una pregunta.</td>\n",
       "      <td>please i have a question</td>\n",
       "      <td>por favor tengo una pregunta</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19971</th>\n",
       "      <td>ok please. or i can ask the other one.</td>\n",
       "      <td>De acuerdo por favor. o puedo preguntarle al o...</td>\n",
       "      <td>Can I see wish list of other people?</td>\n",
       "      <td>¿Puedo ver la lista de deseos de otras personas?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19972</th>\n",
       "      <td>I paid my order several times, because?</td>\n",
       "      <td>Pagué mi pedido varias veces, porque?</td>\n",
       "      <td>I opened the dispute because I have not receiv...</td>\n",
       "      <td>Abrí la disputa porque no recibí mi número de ...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19973</th>\n",
       "      <td>How do I exchange coins for coupon</td>\n",
       "      <td>¿Cómo cambio monedas por cupón?</td>\n",
       "      <td>How to change my coins for coupon?</td>\n",
       "      <td>¿Cómo cambiar mis monedas por cupón?</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19974</th>\n",
       "      <td>link open a dispute</td>\n",
       "      <td>enlace abrir una disputa</td>\n",
       "      <td>how to cancel an open dispute?</td>\n",
       "      <td>cómo cancelar una disputa abierta?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19975</th>\n",
       "      <td>and you send a email to seller with my email i...</td>\n",
       "      <td>y usted envía un correo electrónico al vendedo...</td>\n",
       "      <td>how am i going to send email to you</td>\n",
       "      <td>¿Cómo te enviaré un correo electrónico?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19976</th>\n",
       "      <td>So i contact the seller i want my money back</td>\n",
       "      <td>Entonces me pongo en contacto con el vendedor ...</td>\n",
       "      <td>The goods are defective. I want my money back ...</td>\n",
       "      <td>Los productos son defectuosos Quiero mi dinero...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19977</th>\n",
       "      <td>I want a real person &amp;amp; NOT a robot.</td>\n",
       "      <td>Quiero una persona real y amp; NO es un robot.</td>\n",
       "      <td>i want to talk to a real person</td>\n",
       "      <td>quiero hablar con una persona real</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19978</th>\n",
       "      <td>did you even give a answer</td>\n",
       "      <td>¿Has dado una respuesta?</td>\n",
       "      <td>I opened dispute but did not get an answer</td>\n",
       "      <td>Abrí la disputa pero no recibí una respuesta</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19979</th>\n",
       "      <td>the same thing happen to me with the chinese s...</td>\n",
       "      <td>Me pasa lo mismo con los vendedores chinos en ...</td>\n",
       "      <td>sellers do not send me my order</td>\n",
       "      <td>los vendedores no me envían mi pedido</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19980</th>\n",
       "      <td>How to ship back the item</td>\n",
       "      <td>Cómo devolver el artículo</td>\n",
       "      <td>How can I ship to China?</td>\n",
       "      <td>¿Cómo puedo enviar a China?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19981</th>\n",
       "      <td>how to subscribed</td>\n",
       "      <td>cómo suscribirse</td>\n",
       "      <td>How to be affiliate</td>\n",
       "      <td>Cómo ser afiliado</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19982</th>\n",
       "      <td>I can not upload videos or photos to the dispute</td>\n",
       "      <td>No puedo subir videos o fotos a la disputa</td>\n",
       "      <td>how do I upload my video in response to a medi...</td>\n",
       "      <td>¿Cómo cargo mi video en respuesta a una disput...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19983</th>\n",
       "      <td>ok...I have a question for you</td>\n",
       "      <td>ok ... tengo una pregunta para ti</td>\n",
       "      <td>I have a question can you help?</td>\n",
       "      <td>Tengo una pregunta, ¿puedes ayudarme?</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19984</th>\n",
       "      <td>ja watch for me</td>\n",
       "      <td>mira por mí</td>\n",
       "      <td>Please call me.</td>\n",
       "      <td>Por favor, llámame.</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19985</th>\n",
       "      <td>How to register an account</td>\n",
       "      <td>Cómo registrar una cuenta</td>\n",
       "      <td>How can I register account?</td>\n",
       "      <td>¿Cómo puedo registrar mi cuenta?</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19986</th>\n",
       "      <td>How can I collect my order in cart?</td>\n",
       "      <td>¿Cómo puedo recoger mi pedido en el carrito?</td>\n",
       "      <td>How can I move wish item list to my cart?</td>\n",
       "      <td>¿Cómo puedo mover la lista de artículos desead...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19987</th>\n",
       "      <td>How change post code</td>\n",
       "      <td>Cómo cambiar el código postal</td>\n",
       "      <td>How do I pay with post pay?</td>\n",
       "      <td>¿Cómo pago con pospago?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19988</th>\n",
       "      <td>via bank card</td>\n",
       "      <td>a través de una tarjeta bancaria</td>\n",
       "      <td>What is a copy of the bank statement for the c...</td>\n",
       "      <td>¿Qué es una copia del extracto bancario de la ...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19989</th>\n",
       "      <td>Where do I find settings to manage payment cards</td>\n",
       "      <td>¿Dónde encuentro configuraciones para administ...</td>\n",
       "      <td>Where do I manage my photo?</td>\n",
       "      <td>¿Dónde administro mi foto?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19990</th>\n",
       "      <td>i cant track my orders</td>\n",
       "      <td>no puedo rastrear mis pedidos</td>\n",
       "      <td>Can I track my order?</td>\n",
       "      <td>¿Puedo rastrear mi pedido?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19991</th>\n",
       "      <td>My card keeps getting denied, how do I fix that?</td>\n",
       "      <td>Mi tarjeta sigue siendo denegada, ¿cómo puedo ...</td>\n",
       "      <td>How can I do if my card is stolen?</td>\n",
       "      <td>¿Cómo puedo hacer si me roban mi tarjeta?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19992</th>\n",
       "      <td>i can't find it</td>\n",
       "      <td>no puedo encontrarlo</td>\n",
       "      <td>i cant call you</td>\n",
       "      <td>no puedo llamarte</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19993</th>\n",
       "      <td>It never get frozen it goes to pay and it is p...</td>\n",
       "      <td>Nunca se congela, va a pagar y se paga al inst...</td>\n",
       "      <td>what happen when my order get frozen?</td>\n",
       "      <td>¿Qué sucede cuando mi pedido se congela?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19994</th>\n",
       "      <td>this is getting no where</td>\n",
       "      <td>esto no está llegando a ningún lado</td>\n",
       "      <td>My order keeps getting cancelled and I am not ...</td>\n",
       "      <td>Mi orden sigue siendo cancelada y no me devuel...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19995</th>\n",
       "      <td>how to remove credit card information?</td>\n",
       "      <td>cómo eliminar la información de la tarjeta de ...</td>\n",
       "      <td>How to pay with credit card?</td>\n",
       "      <td>¿Cómo pagar con tarjeta de crédito?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19996</th>\n",
       "      <td>Didnt say anything about email</td>\n",
       "      <td>No dije nada sobre el correo electrónico</td>\n",
       "      <td>When I receive email with my order i click on ...</td>\n",
       "      <td>Cuando recibo un correo electrónico con mi ord...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19997</th>\n",
       "      <td>how to add evidence to dispute?</td>\n",
       "      <td>cómo agregar evidencia a disputa?</td>\n",
       "      <td>how to add friends by TM</td>\n",
       "      <td>cómo agregar amigos por TM</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19998</th>\n",
       "      <td>When I open a dispute it says Order empty</td>\n",
       "      <td>Cuando abro una disputa, dice Order empty</td>\n",
       "      <td>I cannot open dispute for order in Awaiting De...</td>\n",
       "      <td>No puedo abrir una disputa por orden en Espera...</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19999</th>\n",
       "      <td>i need to speak with someone</td>\n",
       "      <td>necesito hablar con alguien</td>\n",
       "      <td>do you speak spanish?</td>\n",
       "      <td>¿hablas español?</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>20000 rows × 5 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                   eng_1  \\\n",
       "0                     hello, i click in product received   \n",
       "1      Hello! I have closed the dispute on may 21, 20...   \n",
       "2      l ordered from spain to spain now they send th...   \n",
       "3                           Do I need to pay custom duty   \n",
       "4                             I didn't receive my order?   \n",
       "5      Hi Eva. At first the question. Can I write in ...   \n",
       "6                                          I am so angry   \n",
       "7                          I am not able to open dispute   \n",
       "8                          how can I check order number?   \n",
       "9                         No, I need an answer from you.   \n",
       "10                               how to reply to dispute   \n",
       "11               I DONT NOT LIVE IN CHINA, I LIVE BRAZIL   \n",
       "12      What does it mean: Your order will be closed in?   \n",
       "13                                 how to exchange coins   \n",
       "14                        how do I report a fraud seller   \n",
       "15     Hi I want to buy something but seller have to ...   \n",
       "16       How do I know whether my order has been shipped   \n",
       "17          i cancelled my order with the seller already   \n",
       "18     l ordered from spain to spain now they send th...   \n",
       "19                      I want to do shopping how to buy   \n",
       "20     Hi, I live in Canada and I'm currently trackin...   \n",
       "21     The promotion began, but why the price of prod...   \n",
       "22                                the color number was L   \n",
       "23                         i have done done all tracking   \n",
       "24                  My forms and documents are not going   \n",
       "25                                    how to place order   \n",
       "26           impossible to join contact customer support   \n",
       "27                      I want to do shopping how to buy   \n",
       "28                         I am not able to open dispute   \n",
       "29                        my order isn't being processed   \n",
       "...                                                  ...   \n",
       "19970           hi, i see this link but i have question.   \n",
       "19971             ok please. or i can ask the other one.   \n",
       "19972            I paid my order several times, because?   \n",
       "19973                 How do I exchange coins for coupon   \n",
       "19974                                link open a dispute   \n",
       "19975  and you send a email to seller with my email i...   \n",
       "19976       So i contact the seller i want my money back   \n",
       "19977            I want a real person &amp; NOT a robot.   \n",
       "19978                         did you even give a answer   \n",
       "19979  the same thing happen to me with the chinese s...   \n",
       "19980                          How to ship back the item   \n",
       "19981                                  how to subscribed   \n",
       "19982   I can not upload videos or photos to the dispute   \n",
       "19983                     ok...I have a question for you   \n",
       "19984                                    ja watch for me   \n",
       "19985                         How to register an account   \n",
       "19986                How can I collect my order in cart?   \n",
       "19987                               How change post code   \n",
       "19988                                      via bank card   \n",
       "19989   Where do I find settings to manage payment cards   \n",
       "19990                             i cant track my orders   \n",
       "19991   My card keeps getting denied, how do I fix that?   \n",
       "19992                                    i can't find it   \n",
       "19993  It never get frozen it goes to pay and it is p...   \n",
       "19994                           this is getting no where   \n",
       "19995             how to remove credit card information?   \n",
       "19996                     Didnt say anything about email   \n",
       "19997                    how to add evidence to dispute?   \n",
       "19998          When I open a dispute it says Order empty   \n",
       "19999                       i need to speak with someone   \n",
       "\n",
       "                                                   spn_1  \\\n",
       "0                hola, hago clic en el producto recibido   \n",
       "1      ¡Hola! Cerré la disputa el 21 de mayo de 2017 ...   \n",
       "2      Ordené de España a España ahora que mandan el ...   \n",
       "3                  ¿Debo pagar impuestos personalizados?   \n",
       "4                                   No recibí mi pedido?   \n",
       "5      Hola Eva Al principio la pregunta. ¿Puedo escr...   \n",
       "6                                      estoy tan enojado   \n",
       "7                             No puedo abrir una disputa   \n",
       "8             ¿Cómo puedo verificar el número de pedido?   \n",
       "9                       No, necesito una respuesta tuya.   \n",
       "10                          cómo responder a una disputa   \n",
       "11                         NO VIVO EN CHINA, VIVO BRASIL   \n",
       "12                ¿Qué significa: su orden será cerrada?   \n",
       "13                             cómo intercambiar monedas   \n",
       "14                ¿Cómo informo a un vendedor de fraude?   \n",
       "15     Hola, quiero comprar algo, pero el vendedor ti...   \n",
       "16       ¿Cómo puedo saber si mi pedido ha sido enviado?   \n",
       "17                  cancelé mi pedido con el vendedor ya   \n",
       "18     Ordené de España a España ahora que mandan el ...   \n",
       "19                     Quiero hacer compras cómo comprar   \n",
       "20     Hola, vivo en Canadá y actualmente estoy rastr...   \n",
       "21     La promoción comenzó, pero ¿por qué el precio ...   \n",
       "22                              el número de color era L   \n",
       "23                          He hecho todo el seguimiento   \n",
       "24                   Mis formularios y documentos no van   \n",
       "25                                  cómo hacer un pedido   \n",
       "26     imposible unirse a la atención al cliente de c...   \n",
       "27                     Quiero hacer compras cómo comprar   \n",
       "28                            No puedo abrir una disputa   \n",
       "29                    mi pedido no está siendo procesado   \n",
       "...                                                  ...   \n",
       "19970     hola, veo este enlace pero tengo una pregunta.   \n",
       "19971  De acuerdo por favor. o puedo preguntarle al o...   \n",
       "19972              Pagué mi pedido varias veces, porque?   \n",
       "19973                    ¿Cómo cambio monedas por cupón?   \n",
       "19974                           enlace abrir una disputa   \n",
       "19975  y usted envía un correo electrónico al vendedo...   \n",
       "19976  Entonces me pongo en contacto con el vendedor ...   \n",
       "19977     Quiero una persona real y amp; NO es un robot.   \n",
       "19978                           ¿Has dado una respuesta?   \n",
       "19979  Me pasa lo mismo con los vendedores chinos en ...   \n",
       "19980                          Cómo devolver el artículo   \n",
       "19981                                   cómo suscribirse   \n",
       "19982         No puedo subir videos o fotos a la disputa   \n",
       "19983                  ok ... tengo una pregunta para ti   \n",
       "19984                                        mira por mí   \n",
       "19985                          Cómo registrar una cuenta   \n",
       "19986       ¿Cómo puedo recoger mi pedido en el carrito?   \n",
       "19987                      Cómo cambiar el código postal   \n",
       "19988                   a través de una tarjeta bancaria   \n",
       "19989  ¿Dónde encuentro configuraciones para administ...   \n",
       "19990                      no puedo rastrear mis pedidos   \n",
       "19991  Mi tarjeta sigue siendo denegada, ¿cómo puedo ...   \n",
       "19992                               no puedo encontrarlo   \n",
       "19993  Nunca se congela, va a pagar y se paga al inst...   \n",
       "19994                esto no está llegando a ningún lado   \n",
       "19995  cómo eliminar la información de la tarjeta de ...   \n",
       "19996           No dije nada sobre el correo electrónico   \n",
       "19997                  cómo agregar evidencia a disputa?   \n",
       "19998          Cuando abro una disputa, dice Order empty   \n",
       "19999                        necesito hablar con alguien   \n",
       "\n",
       "                                                   eng_2  \\\n",
       "0      I bought a product and have not received a con...   \n",
       "1      I did not get refund of my money. Two months h...   \n",
       "2      My order came but color different from that I ...   \n",
       "3                                How to pay customs duty   \n",
       "4         My order shows that I have not paid, but I did   \n",
       "5                How can I write feedback for the goods?   \n",
       "6                  I opened a dispute and so far nothing   \n",
       "7                                I am not able to track.   \n",
       "8        Where I can see the number of my order tracker?   \n",
       "9      I need an invoice for this item i bought from you   \n",
       "10                           How do I reply to feedback?   \n",
       "11                               i want live contact now   \n",
       "12              tracking order what does collection mean   \n",
       "13                    How to change my coins for coupon?   \n",
       "14                               I want to report seller   \n",
       "15          hi i need to tell u something about my order   \n",
       "16               How can I know if my order was shipped?   \n",
       "17                      I have already paid for my order   \n",
       "18                             I'm a supplier from china   \n",
       "19                       i will come to see you tomorrow   \n",
       "20     When can I receive my package after the produc...   \n",
       "21               Why the promotion price is not changed?   \n",
       "22                              How can l see my message   \n",
       "23     I have a dispute and the company has done noth...   \n",
       "24                 When am I going to receive my orders?   \n",
       "25                                 How do I place order?   \n",
       "26                   how can I contact customer support?   \n",
       "27                                What is shopping cart?   \n",
       "28         I am not able to attach a photo for a dispute   \n",
       "29                   My debit card is not being accepted   \n",
       "...                                                  ...   \n",
       "19970                           please i have a question   \n",
       "19971               Can I see wish list of other people?   \n",
       "19972  I opened the dispute because I have not receiv...   \n",
       "19973                 How to change my coins for coupon?   \n",
       "19974                     how to cancel an open dispute?   \n",
       "19975                how am i going to send email to you   \n",
       "19976  The goods are defective. I want my money back ...   \n",
       "19977                    i want to talk to a real person   \n",
       "19978         I opened dispute but did not get an answer   \n",
       "19979                    sellers do not send me my order   \n",
       "19980                           How can I ship to China?   \n",
       "19981                                How to be affiliate   \n",
       "19982  how do I upload my video in response to a medi...   \n",
       "19983                    I have a question can you help?   \n",
       "19984                                    Please call me.   \n",
       "19985                        How can I register account?   \n",
       "19986          How can I move wish item list to my cart?   \n",
       "19987                        How do I pay with post pay?   \n",
       "19988  What is a copy of the bank statement for the c...   \n",
       "19989                        Where do I manage my photo?   \n",
       "19990                              Can I track my order?   \n",
       "19991                 How can I do if my card is stolen?   \n",
       "19992                                    i cant call you   \n",
       "19993              what happen when my order get frozen?   \n",
       "19994  My order keeps getting cancelled and I am not ...   \n",
       "19995                       How to pay with credit card?   \n",
       "19996  When I receive email with my order i click on ...   \n",
       "19997                           how to add friends by TM   \n",
       "19998  I cannot open dispute for order in Awaiting De...   \n",
       "19999                              do you speak spanish?   \n",
       "\n",
       "                                                   spn_2  label  \n",
       "0      Compré un producto y no he recibido un correo ...      0  \n",
       "1      No obtuve el reembolso de mi dinero. Han pasad...      0  \n",
       "2      Mi pedido llegó pero el color es diferente al ...      0  \n",
       "3                      Cómo pagar los derechos de aduana      1  \n",
       "4       Mi pedido muestra que no he pagado, pero lo hice      0  \n",
       "5      ¿Cómo puedo escribir comentarios para los prod...      0  \n",
       "6                    Abrí una disputa y hasta ahora nada      0  \n",
       "7                                     No puedo rastrear.      0  \n",
       "8      ¿Dónde puedo ver el número de mi rastreador de...      0  \n",
       "9      Necesito una factura por este artículo que te ...      0  \n",
       "10                     ¿Cómo respondo a los comentarios?      0  \n",
       "11                         quiero contacto en vivo ahora      0  \n",
       "12          orden de seguimiento qué significa colección      0  \n",
       "13                  ¿Cómo cambiar mis monedas por cupón?      1  \n",
       "14                           Quiero informar al vendedor      1  \n",
       "15             hola necesito decirte algo sobre mi orden      0  \n",
       "16           ¿Cómo puedo saber si mi pedido fue enviado?      1  \n",
       "17                                    Ya pagué mi pedido      0  \n",
       "18                             Soy un proveedor de china      0  \n",
       "19                                 vendré a verte mañana      0  \n",
       "20     ¿Cuándo puedo recibir mi paquete después de en...      0  \n",
       "21      ¿Por qué el precio de la promoción no se cambia?      1  \n",
       "22                           ¿Cómo puedo ver mi mensaje?      0  \n",
       "23     Tengo una disputa y la compañía no ha hecho na...      0  \n",
       "24                         ¿Cuándo recibiré mis pedidos?      0  \n",
       "25                                 ¿Cómo hago el pedido?      1  \n",
       "26     ¿Cómo puedo contactar al servicio de atención ...      1  \n",
       "27                        ¿Qué es un carrito de compras?      0  \n",
       "28           No puedo adjuntar una foto para una disputa      0  \n",
       "29          Mi tarjeta de débito no está siendo aceptada      0  \n",
       "...                                                  ...    ...  \n",
       "19970                       por favor tengo una pregunta      1  \n",
       "19971   ¿Puedo ver la lista de deseos de otras personas?      0  \n",
       "19972  Abrí la disputa porque no recibí mi número de ...      0  \n",
       "19973               ¿Cómo cambiar mis monedas por cupón?      1  \n",
       "19974                 cómo cancelar una disputa abierta?      0  \n",
       "19975            ¿Cómo te enviaré un correo electrónico?      0  \n",
       "19976  Los productos son defectuosos Quiero mi dinero...      0  \n",
       "19977                 quiero hablar con una persona real      1  \n",
       "19978       Abrí la disputa pero no recibí una respuesta      0  \n",
       "19979              los vendedores no me envían mi pedido      0  \n",
       "19980                        ¿Cómo puedo enviar a China?      0  \n",
       "19981                                  Cómo ser afiliado      0  \n",
       "19982  ¿Cómo cargo mi video en respuesta a una disput...      0  \n",
       "19983              Tengo una pregunta, ¿puedes ayudarme?      1  \n",
       "19984                                Por favor, llámame.      0  \n",
       "19985                   ¿Cómo puedo registrar mi cuenta?      1  \n",
       "19986  ¿Cómo puedo mover la lista de artículos desead...      0  \n",
       "19987                            ¿Cómo pago con pospago?      0  \n",
       "19988  ¿Qué es una copia del extracto bancario de la ...      0  \n",
       "19989                         ¿Dónde administro mi foto?      0  \n",
       "19990                         ¿Puedo rastrear mi pedido?      0  \n",
       "19991          ¿Cómo puedo hacer si me roban mi tarjeta?      0  \n",
       "19992                                  no puedo llamarte      0  \n",
       "19993           ¿Qué sucede cuando mi pedido se congela?      0  \n",
       "19994  Mi orden sigue siendo cancelada y no me devuel...      0  \n",
       "19995                ¿Cómo pagar con tarjeta de crédito?      0  \n",
       "19996  Cuando recibo un correo electrónico con mi ord...      0  \n",
       "19997                         cómo agregar amigos por TM      0  \n",
       "19998  No puedo abrir una disputa por orden en Espera...      0  \n",
       "19999                                   ¿hablas español?      0  \n",
       "\n",
       "[20000 rows x 5 columns]"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dl = DataLoader()\n",
    "dl.load_dataset(eng_train)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Err on  ['talk', '·']\n",
      "Err on  ['τ', '•']\n",
      "Err on  ['—machine', 'elf']\n",
      "Err on  ['–', 'editør']\n",
      "Err on  ['html', 'is']\n",
      "Err on  ['ã¥â¼â\\x80ã¥â¥â\\x96ã¥â', 'â¬ã¥â\\x91â\\x8a']\n",
      "Err on  ['gimnã', 'stic']\n",
      "Err on  ['ã\\x90â´ã\\x90â»ã\\x91â\\x8fã\\x90â¸ã\\x91â\\x81ã\\x90âºã\\x90â»ã\\x91â\\x8eã\\x91â\\x87ã\\x90âµã\\x90â½ã\\x90â¸ã\\x91â\\x8fã\\x90â¾ã\\x90â±ã\\x91â', 'ã\\x90â¾ã\\x90â´ã\\x90â¾ã\\x90â²']\n",
      "Err on  ['ã\\x90â´ã\\x90â»ã\\x91â\\x8fã\\x90â¸ã\\x91â\\x81ã\\x90âºã\\x90â»ã\\x91â\\x8eã\\x91â\\x87ã\\x90âµã\\x90â½ã\\x90â¸ã\\x91â\\x8fã\\x90â¾ã\\x90â±ã\\x91â', 'ã\\x90â¾ã\\x90â´ã\\x90â¾ã\\x90â²ã\\x91â\\x81ã\\x90â¿ã\\x90â°ã\\x90â¼']\n",
      "Err on  ['ã\\x90â\\x9fã\\x91â\\x80ã\\x90â¸ã\\x90â½ã\\x90âµã\\x90â¾ã\\x90â±ã\\x91â', 'ã\\x90â¾ã\\x90â´ã\\x90â¸ã\\x90â¼ã\\x90â¾ã\\x91â\\x81ã\\x91â\\x82ã\\x90â¸ã\\x90â¸ã\\x91â\\x81ã\\x90âºã\\x90â»ã\\x91â\\x8eã\\x91â\\x87ã\\x90âµã\\x90â½ã\\x90â¸ã\\x91â\\x8fã\\x90â±ã\\x91â\\x83ã\\x90â´ã\\x91â\\x83ã\\x91â\\x82ã\\x91â\\x81ã\\x90â¾ã\\x90â·ã\\x90â´ã\\x90â°ã\\x90â½ã\\x91â\\x8b']\n",
      "Err on  ['keikyū', 'kakuekiteisha']\n",
      "Err on  ['—', 'i']\n",
      "Err on  ['talk', '»']\n",
      "Err on  ['—', 'it']\n",
      "Err on  ['–', 'archived']\n",
      "Err on  ['–', 'kerαunoςcopia◁galaxies']\n",
      "Err on  ['vandalism', '–']\n",
      "Err on  ['–', 'i']\n",
      "Err on  ['wikipedia,', 'https']\n",
      "Err on  ['wikipedia', 'and']\n",
      "Err on  ['sources', 'and']\n",
      "Err on  ['—', 'тαʟκ✍']\n",
      "Err on  ['—', 'the']\n",
      "Err on  ['com/news/ã¤â¸â\\x8aã¦âµâ·ã¦â\\x90â¬ã¥â®â¶ã¥â', 'â¬ã¥â\\x8fâ¸']\n",
      "Err on  ['the', 'https']\n",
      "Err on  ['see', 'https']\n",
      "Err on  ['—', 'but']\n",
      "Err on  ['å\\x86', 'æ\\x8a½ç\\x9c\\x9fç©ºå\\x8c']\n",
      "Err on  ['com/up/ù', 'ø±ù\\x83ø²']\n",
      "Err on  ['#', 'the']\n",
      "Err on  ['^', 'jump']\n",
      "Err on  ['–', 'it']\n",
      "Err on  ['nguyá»', 'n']\n",
      "Err on  ['doctrine', 'and']\n",
      "Err on  ['ð', 'ð°ñ\\x81ñ\\x81ñ\\x8bð»ðºð¸']\n",
      "Err on  ['book', 'of']\n",
      "Err on  ['—', 'and']\n",
      "Err on  [',', 'isbn']\n",
      "Err on  ['‒', 'jaymax✍']\n",
      "Err on  ['miã', 's']\n",
      "Err on  ['the', 'university']\n",
      "Err on  ['jesus', 'christ']\n",
      "Err on  ['–', 'the']\n",
      "Err on  ['—', 'irrelevant']\n",
      "Err on  ['–', 'and']\n",
      "Err on  ['ryã', 'â']\n",
      "Err on  ['/ã\\x99â\\x87ã\\x99â', 'ã\\x9aâ©ã\\x98â§ã\\x98â±ã\\x9bâ\\x8c']\n",
      "Err on  ['w', 'krakowie']\n",
      "Err on  ['i', 'would']\n",
      "Err on  ['php/despre_plutrocaã', 'â£ie_ã']\n",
      "Err on  ['—', '✈']\n",
      "Err on  ['—', 'you']\n",
      "Err on  ['shã', 'â\\x8djo']\n",
      "Err on  ['–', '@']\n",
      "Err on  ['org/wiki/ù', 'ù\\x86øªø¯ù\\x89_ø§ù\\x84ø¬ø²ù\\x8aø±ø©_øªù\\x88ù\\x83']\n",
      "Err on  ['–', 'this']\n",
      "Err on  ['war', 'ii']\n",
      "Err on  ['th', 'century']\n",
      "Err on  ['å', 'tambuk']\n",
      "Err on  ['—', 'as']\n",
      "Err on  ['–', 'which']\n",
      "Err on  ['–', 'but']\n",
      "Err on  ['org/wiki/ù\\x82ø§ù\\x86ù\\x88ù\\x86_ø§ø³ø§ø³û\\x8c_ø¬ù', 'ù\\x87ù\\x88ø±û\\x8c_ø§ø³ù\\x84ø§ù']\n",
      "Err on  ['i', 'do']\n",
      "Err on  ['–', 'a']\n",
      "Err on  ['ã\\x99â', 'ã\\x99â\\x86ã\\x98âªã\\x98â¸ã\\x98â±ã\\x9bâ\\x8c']\n",
      "Err on  ['ã\\x98â§ã\\x98â¹ã\\x99â\\x84ã\\x98â§ã\\x99â', 'ã\\x9bâ\\x8cã\\x99â\\x87']\n",
      "Err on  ['—', 'a']\n",
      "Err on  ['—', 'in']\n",
      "Err on  ['braã', 'â\\x9fov']\n",
      "Err on  ['tv', 'ribia']\n",
      "Err on  ['ñ\\x81ð°ð¹ñ\\x82ñ\\x87ðµñ\\x87ðµð½ñ\\x81ðºð¸ñ', 'ñ\\x82ðµñ\\x80ñ\\x80ð¾ñ\\x80ð¸ñ\\x81ñ\\x82ð¾ð²']\n",
      "Err on  ['championship', 'champions']\n",
      "Err on  ['com/shã', 'â\\x8djo_manga/japan_quarterly/index']\n",
      "Err on  ['h', 'e']\n",
      "Err on  ['at', 'https']\n",
      "Err on  ['–', 'is']\n",
      "Err on  ['æ\\x9d¥ã\\x81¦ã\\x81\\x8fã\\x81', 'ã\\x81\\x95ã\\x81\\x84ã\\x80\\x82']\n",
      "Err on  ['cracow', 'university']\n",
      "Err on  ['–', 'in']\n",
      "Err on  ['i', 'think']\n",
      "Err on  [',', '−']\n",
      "Err on  ['press,', 'albuquerque']\n",
      "Err on  ['liangchun', 'and']\n",
      "Err on  ['and', 'the']\n",
      "Err on  ['machine', 'elf']\n",
      "Err on  ['drniã', 'â¡']\n",
      "Err on  ['carnivã', 'le']\n",
      "Err on  ['—', 'they']\n",
      "Err on  ['三藏法師玄奘奉', '詔譯']\n",
      "Err on  ['ù', 'ø¬ù']\n",
      "Err on  ['—', 'which']\n",
      "Err on  ['in', 'https']\n",
      "Err on  ['–', 'no']\n",
      "Err on  ['–', 'not']\n",
      "Err on  ['book', 'of']\n",
      "Err on  ['—', 'he']\n",
      "Err on  ['ã', 'â\\x9eampiyonu']\n",
      "Err on  ['_×ª×\\x95×\\x9b×', '×\\x99×ª_×\\x9e×¡â\\x80\\x99_']\n",
      "Err on  ['—', 'is']\n",
      "Err on  ['—', 'if']\n",
      "Err on  ['•', 'cleves']\n",
      "Err on  ['t', 'h']\n",
      "Err on  ['from', 'https']\n",
      "Err on  ['the', 'international']\n",
      "Err on  ['·', 'the']\n",
      "Err on  ['/ã', 'â¨â\\x9cã']\n",
      "Err on  ['com/ã', 'â¹â\\x80ã']\n",
      "Err on  ['ã', 'â\\x9awidermajer']\n",
      "Err on  [',', 'isbn']\n",
      "Err on  ['fu', '武術季刊誌《武術']\n",
      "Err on  ['com/ã©â\\x98â¿ã©â\\x87â\\x8cã¥â±â±ã¥â', 'â¨ã¦â\\x96â¹ã¤â½â\\x8dã¦â\\x97â']\n",
      "Err on  ['com/ø¥ø³øªù', 'ø¹']\n",
      "Err on  ['–', 'missouri']\n",
      "Err on  [',', 'and']\n",
      "Err on  ['ã', 'â']\n",
      "Err on  ['brigham', 'young']\n",
      "Err on  ['premier', 'runners']\n",
      "Err on  ['jp', 'ｎｐｏ法人日本土壌の会']\n",
      "Err on  ['lds', 'sources']\n",
      "Err on  ['com/ù', 'ø±ú©ø²']\n",
      "Err on  ['kruã', 'â¡evac']\n",
      "Err on  ['eskiã', 'â\\x9fehirspor']\n",
      "Err on  ['i', 'am']\n",
      "Err on  ['sockpuppetry', '–']\n",
      "Err on  ['a', 'https']\n",
      "Err on  ['fã', 'bregas']\n",
      "Err on  ['zbigniew', 'paszek']\n",
      "Err on  ['htmlã', 'â®â\\x87ã']\n",
      "Err on  ['—', 'fails']\n",
      "Err on  ['—', 'to']\n",
      "Err on  ['raã', 'â¾natoviã\\x84â\\x87']\n",
      "Err on  ['—', 'there']\n",
      "Err on  [',', 'the']\n",
      "Err on  ['ã', 'â¸â¥ã']\n",
      "Err on  ['·', 'professor']\n",
      "Err on  ['htmlã£â\\x80â\\x8dã£â\\x82â\\x92ã¥â\\x8fâ\\x82ã§â', 'â§']\n",
      "Err on  ['history', 'of']\n",
      "Err on  ['ð\\x9cñ\\x83ñ\\x81ð¸ð½_ð\\x9cð¸ñ', 'ð°ð¸ð»_ð\\x9dð°ð´ð¸ð¼ð¾ð²ð¸ñ\\x87']\n",
      "Err on  ['ã', 'â\\x9e']\n",
      "Err on  ['for', 'the']\n",
      "Err on  ['—', 'like']\n",
      "Err on  ['jp/ã¦â', 'âªã¥â¼â\\x8fã¤â¼â\\x9aã§â¤â¾']\n",
      "Err on  ['the', 'internet']\n",
      "Err on  ['tomã', 's']\n",
      "Err on  ['gumi', 'inheritance']\n",
      "Err on  ['hō', 'hassha']\n",
      "Err on  ['engineer', 'needs']\n",
      "Err on  ['—', 'one']\n",
      "Err on  ['i', 'could']\n",
      "Err on  ['—', 'see']\n",
      "Err on  ['–', 'as']\n",
      "Err on  ['wyrwaã', 'â\\x82']\n",
      "Err on  ['arabes/ã\\x98â£ã\\x99â', '%']\n",
      "Err on  ['–', 'keep']\n",
      "Err on  ['–', 'if']\n",
      "Err on  ['—', 'so']\n",
      "Err on  ['the', 'lost']\n",
      "Err on  ['org/wikibooks/ru/wiki/ã\\x90â\\x97ã\\x90â°ã\\x91â\\x89ã\\x90â¸ã\\x91â\\x82ã\\x90â°_ã\\x90âºã\\x90â¾ã\\x90â½ã\\x91â\\x84ã\\x90â¸ã\\x90â´ã\\x90âµã\\x90â½ã\\x91â\\x86ã\\x90â¸ã\\x90â°ã\\x90â»ã\\x91â\\x8cã\\x90â½ã\\x91â\\x8bã\\x91â', '_ã\\x90â´ã\\x90â°ã\\x90â½ã\\x90â½ã\\x91â\\x8bã\\x91â']\n",
      "Total 2518802 word vectors.\n"
     ]
    }
   ],
   "source": [
    "embedding = dl.load_embedding(embedding_path=\"wordvec/wiki.en.vec\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Total words 2518802\n",
      "Embedding size 300\n",
      "Note that this embedding has performed lower casting.\n"
     ]
    }
   ],
   "source": [
    "print(\"Total words\", len(embedding))\n",
    "print(\"Embedding size\", len(embedding['i']))\n",
    "print(\"Note that this embedding has performed lower casting.\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.6.1"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
